import matplotlib.pyplot as plt
import pandas as pd
from sklearn import model_selection
from sklearn.linear_model import LinearRegression
# Use a CJK-capable sans-serif font so Chinese labels render in matplotlib figures.
plt.rcParams['font.sans-serif'] = 'Simhei'

# Load the pre-processed listing table; every name below is a column of this sheet.
df = pd.read_excel('最新发布的北京二手房数据_预处理.xlsx')

# Regression target and the single-column area feature (both are Series).
unit_price = df['单价（元/平方米）']
house_area = df['面积（平方米）']

# Multi-column selections need a *list* of labels. The previous form,
# df['室','厅'], passed the tuple ('室', '厅') as one column key and raised
# KeyError on a frame with ordinary (non-MultiIndex) columns.
house_type = df[['室', '厅']]

# NOTE(review): '西域' looks like a typo for '西城' — confirm against the
# sheet's actual column header before changing it here.
house_regin = df[[
    '通州', '朝阳', '昌平', '顺义', '丰台', '海淀', '西域', '房山', '石景山',
    '大兴', '怀柔', '东城', '门头沟', '密云', '延庆', '平谷', '亦庄开发区',
]]
house_finish = df[['毛坯', '简装', '精装']]

# NOTE(review): the four selections below still use empty-string placeholders
# for the column names. As written they raise KeyError unless the sheet really
# has a column named ''. Fill in the real headers before running.
house_structure = df[['', '', '', '']]
is_subway = df[['', '']]
house_dirt = df[['', '', '', '', '', '', '', '']]
house_year = df['']

# Feature matrix: all selected columns side by side (axis=1), aligned on df's index.
x = pd.concat(
    [
        house_area,
        house_type,
        house_regin,
        house_finish,
        house_structure,
        is_subway,
        house_dirt,
        house_year,
    ],
    axis=1,
)
y = unit_price